This is a detailed summary of the Global Terrorism Database, including an India-specific analysis.

Global: Most of the cities with high numbers are in Iraq and Somalia. We also see cities like Colombo (LTTE) and Medellin (Escobar).

Global: Citizens, police and military suffer the most casualties.

Global: Police, military and government are the main targets.

India: Police are the main targets of attacks, as the attacks in Kashmir and Punjab show. Informants and political rallies are also key targets.

Now let's see whether there is any trend in the usage of "weaptype1_txt" over the years.

---
title: "Analysis of terrorist attacks across the world"
# `theme` is an argument of the output format, so it has to be nested under
# html_notebook; as a top-level key it never reaches the renderer.
output:
  html_notebook:
    theme: simplex
---

```{r global_options, include=FALSE}
# Notebook-wide chunk defaults: hide code, warnings and messages; centre
# figures; page printed data frames at 30 rows by 10 columns.
knitr::opts_chunk$set(
  fig.width = 6,
  fig.asp = 0.618,
  out.width = "70%",
  fig.align = "center",
  echo = FALSE,
  warning = FALSE,
  message = FALSE,
  rows.print = 30,
  cols.print = 10
)

```


```{r load_libs}
# Packages used throughout the notebook.
library(tidyverse)
library(readxl)
library(data.table)
library(treemap)
library(ggplot2)
library(gridExtra)

# Default ggplot2 theme for every figure: ggthemes' fivethirtyeight look at
# base size 12, with bold plot titles and Arial text.
theme_set(
  ggthemes::theme_fivethirtyeight(12) +
    theme(
      plot.title = element_text(face = "bold"),
      text = element_text(family = "Arial")
    )
)
# Bar fill kept for reference: geom_col(fill = "#4779C7")



```

```{r}
# Location of the GTD csv extract. Set the GTD_CSV environment variable to use
# a different copy; the original hard-coded path is kept as the fallback so
# existing setups keep working.
gtd_path <- Sys.getenv(
  "GTD_CSV",
  unset = "/Users/vinaychuri/VINAY/dataset/terrorist/globalterrorismdb_0718dist.csv"
)
if (!file.exists(gtd_path)) {
  stop(
    "GTD csv not found at '", gtd_path, "'; set GTD_CSV to its location.",
    call. = FALSE
  )
}

# Keep only incidents with at least one recorded fatality. filter() also drops
# rows where nkill is NA, so the later sum(nkill) calls never see NA.
df <- fread(gtd_path) %>%
  filter(nkill > 0)
```

```{r,include=FALSE}
# Column names/types overview; the chunk is include=FALSE, so nothing of this
# reaches the rendered notebook.
dplyr::glimpse(df)
```

This is a detailed summary of the Global Terrorism Database, including an India-specific analysis.

```{r ,fig.cap="Trend across the years", fig.width=6.2,fig.height=3.2}
# Line chart of the number of rows per year in `incidents`; `scope` becomes the
# plot subtitle.
yearly_trend <- function(incidents, scope) {
  per_year <- count(incidents, iyear)
  ggplot(per_year, aes(iyear, n)) +
    scale_x_continuous(breaks = seq(1970, 2017, by = 5)) +
    geom_line() +
    labs(
      title = "Trend across the years",
      subtitle = scope,
      x = "Year",
      y = "Counts"
    )
}

# Global panel on top, India panel below.
grid.arrange(
  yearly_trend(df, "Global"),
  yearly_trend(filter(df, country_txt == "India"), "India"),
  ncol = 1
)
rm(yearly_trend)

```

* Globally, we see that there is an exponential increase in attacks from 2012 onwards and it has skyrocketed.
* India has seen spikes in 1985-86 due to Kashmir & 2007-09 due to the Mumbai attacks.



```{r , fig.width=6.2}

# Total fatalities per country, restricted to the 50 deadliest countries.
# top_n() keeps ties, so slightly more than 50 rows are possible. This table
# drives both treemaps below, so it is computed once.
top_countries <- df %>%
  group_by(country_txt) %>%
  summarise(nk = sum(nkill)) %>%
  top_n(50, wt = nk)

# Treemap 1: one tile per country, sized by total fatalities.
treemap(
  top_countries,
  index = "country_txt",
  vSize = "nk",
  title = "Summary of kills per country(Top 50)",
  palette = "Accent"
)

# Fatalities per country and year for those same countries.
country_year <- df %>%
  filter(country_txt %in% top_countries$country_txt) %>%
  group_by(country_txt, iyear) %>%
  summarise(nk = sum(nkill)) %>%
  ungroup()

# Treemap 2: countries subdivided by year; tile size and colour both encode
# the number killed.
treemap(
  country_year,
  index = c("country_txt", "iyear"),
  type = "value",
  vSize = "nk",
  vColor = "nk",
  palette = "RdBu",
  title = "Killings in Country/Years-Global (Top 50)",
  title.legend = "Number of killed",
  fontsize.title = 10
)

rm(top_countries, country_year)

```

* Iraq has seen the highest number of attacks, and they have caused heavy casualties.
* Iraq, Afghanistan, Pakistan and Syria are all related to the global war on terror and ISIS.
* India's numbers are related to the Pakistan-linked terrorist attacks.
* Sri Lanka's numbers are from the LTTE wars.
* Nigeria/Somalia numbers are from the civil wars and the Boko Haram terrorist attacks.
* The United States numbers are related to the 9/11 attacks. It has a low number killed but a high number wounded.
* Colombia is likely Escobar and the drug-related gang wars.


```{r , fig.width=6.2}

# Treemap of fatalities per region. Incident-level rows are passed in as-is and
# treemap() aggregates vSize within each index value.
treemap(
  select(filter(df, nkill > 0), region_txt, nkill),
  index = "region_txt",
  vSize = "nkill",
  title = "Summary of kills per region",
  palette = "Set1"
)
```

* Middle East/Africa are the center of Civil wars and Global terrorist regions.
* South Asia will include India,Pakistan, Afghanistan


```{r , fig.width=6.2}
# Fatalities per province and year, for the provinces with the highest totals,
# drawn once for the whole world and once for India.

# --- Global ---------------------------------------------------------------
# Province names are not unique across countries (e.g. "Punjab" exists in both
# India and Pakistan), so the global view labels each province with its
# country; otherwise same-named provinces would be summed into one tile.
global_prov <- df %>%
  filter(nkill > 0) %>%
  mutate(provstate = paste0(provstate, " (", country_txt, ")"))

# Top 50 provinces by total fatalities (top_n keeps ties).
top_prov <- global_prov %>%
  group_by(provstate) %>%
  summarise(nk = sum(nkill)) %>%
  top_n(50, wt = nk)

prov_year <- global_prov %>%
  filter(provstate %in% top_prov$provstate) %>%
  group_by(provstate, iyear) %>%
  summarise(nk = sum(nkill)) %>%
  ungroup()

treemap(
  prov_year,
  index = c("provstate", "iyear"),
  type = "value",
  vSize = "nk",
  vColor = "nk",
  palette = "RdBu",
  title = "Killings in Provinces/Years-Global",
  title.legend = "Number of killed",
  fontsize.title = 10
)

# --- India ----------------------------------------------------------------
# Within a single country the plain province name is used as the key.
india_prov <- df %>%
  filter(nkill > 0 & country_txt == "India")

top_prov <- india_prov %>%
  group_by(provstate) %>%
  summarise(nk = sum(nkill)) %>%
  top_n(50, wt = nk)

prov_year <- india_prov %>%
  filter(provstate %in% top_prov$provstate) %>%
  group_by(provstate, iyear) %>%
  summarise(nk = sum(nkill)) %>%
  ungroup()

treemap(
  prov_year,
  index = c("provstate", "iyear"),
  type = "value",
  vSize = "nk",
  vColor = "nk",
  palette = "RdBu",
  title = "Killings in Provinces/Years-India",
  title.legend = "Number of killed",
  fontsize.title = 10
)

rm(global_prov, india_prov, top_prov, prov_year)
```

* Global
  * As we saw in the country graph, Iraq's provinces (Baghdad/Ninewah/Al Anbar/Saladin) have the highest numbers killed.
  * Borno is in Nigeria.
  * Punjab in India saw the highest number of terrorist attacks during the Pakistan and Khalistan movement.
  * New York has a high number killed because of the 9/11 attacks.
* India
  * As we saw earlier, J&K and Punjab started the trend of violence.
  * Maoists have seen their rise in Assam/Chhattisgarh/Maharashtra etc.


```{r,fig.width=6.2}

# Fatalities per city and year, for the cities with the highest totals, drawn
# once for the whole world and once for India.

# --- Global ---------------------------------------------------------------
# City names repeat across countries (e.g. Tripoli in Libya and in Lebanon),
# so the global view labels each city with its country to keep them apart.
# NOTE(review): placeholder city values (blank/unknown) are still ranked like
# real cities - confirm whether they should be excluded.
global_city <- df %>%
  filter(nkill > 0) %>%
  mutate(city = paste0(city, " (", country_txt, ")"))

# Top 50 cities by total fatalities (top_n keeps ties).
top_city <- global_city %>%
  group_by(city) %>%
  summarise(nk = sum(nkill)) %>%
  top_n(50, wt = nk)

city_year <- global_city %>%
  filter(city %in% top_city$city) %>%
  group_by(city, iyear) %>%
  summarise(nk = sum(nkill)) %>%
  ungroup()

treemap(
  city_year,
  index = c("city", "iyear"),
  type = "value",
  vSize = "nk",
  vColor = "nk",
  palette = "RdBu",
  title = "Killings in City/Years-Global",
  title.legend = "Number of killed",
  fontsize.title = 10
)

# --- India ----------------------------------------------------------------
# Within a single country the plain city name is used as the key.
india_city <- df %>%
  filter(nkill > 0 & country_txt == "India")

top_city <- india_city %>%
  group_by(city) %>%
  summarise(nk = sum(nkill)) %>%
  top_n(50, wt = nk)

city_year <- india_city %>%
  filter(city %in% top_city$city) %>%
  group_by(city, iyear) %>%
  summarise(nk = sum(nkill)) %>%
  ungroup()

treemap(
  city_year,
  index = c("city", "iyear"),
  type = "value",
  vSize = "nk",
  vColor = "nk",
  palette = "RdBu",
  title = "Killings in City/Years-India",
  title.legend = "Number of killed",
  fontsize.title = 10
)

rm(global_city, india_city, top_city, city_year)
```

* Global
  * Most of the cities with high numbers are in Iraq and Somalia.
  * We also see cities like Colombo (LTTE) and Medellin (Escobar).

* India
  * Cities across J&K and Punjab are seen, along with Mumbai after the Mumbai blasts.
  


```{r}
# Total fatalities by attack type, bars ordered by total. Comma-formatted axis
# labels match the target-type chart below and avoid scientific notation on
# large sums.
df %>%
  group_by(attacktype1_txt) %>%
  summarise(nkill = sum(nkill)) %>%
  ggplot(aes(reorder(attacktype1_txt, nkill), nkill)) +
  geom_col() +
  coord_flip() +
  scale_y_continuous(labels = scales::comma) +
  labs(title = "Trend across attacktype", x = "attacktype", y = "Counts")

# Total fatalities by target type, bars ordered by total.
df %>%
  group_by(targtype1_txt) %>%
  summarise(nkill = sum(nkill)) %>%
  ggplot(aes(reorder(targtype1_txt, nkill), nkill)) +
  geom_col() +
  coord_flip() +
  scale_y_continuous(labels = scales::comma) +
  labs(title = "Trend across targtype", x = "targtype", y = "Counts")

# Treemap of fatalities: attack types subdivided by target type.
df %>%
  group_by(attacktype1_txt, targtype1_txt) %>%
  summarise(nkill = sum(nkill)) %>%
  ungroup() %>%
  treemap(
    index = c("attacktype1_txt", "targtype1_txt"),
    vSize = "nkill",
    title = "Summary of kills by attack type and target",
    palette = "Set2"
  )



```

* Global
  * Citizens, police and military suffer the most casualties.



 
```{r , fig.height=4,fig.width=6}
# Label missing target sub-types. Depending on how the csv was read, blank
# fields can arrive as NA or as empty strings, so both are mapped to
# 'Not Known' (replace_na alone leaves "" untouched).
df$targsubtype1_txt <- replace_na(na_if(df$targsubtype1_txt, ""), "Not Known")

# 30 most frequent target sub-types, worldwide.
p1 <- df %>%
  count(targsubtype1_txt, sort = TRUE) %>%
  head(30) %>%
  ggplot(aes(reorder(targsubtype1_txt, n), n)) +
  geom_col() +
  coord_flip() +
  labs(title = "Trend across targsubtype Globally", x = "targsubtype", y = "Counts")

# Same ranking restricted to incidents in India.
p2 <- df %>%
  filter(country_txt == "India") %>%
  count(targsubtype1_txt, sort = TRUE) %>%
  head(30) %>%
  ggplot(aes(reorder(targsubtype1_txt, n), n)) +
  geom_col() +
  coord_flip() +
  labs(title = "Trend across targsubtype in India", x = "targsubtype", y = "Counts")

grid.arrange(p1, p2, ncol = 1)
rm(p1, p2)


```

* Global
  * Police, military and government are the main targets.

* India
  * Police are the main targets of attacks, as the attacks in Kashmir/Punjab show.
  * Informants and political rallies are also key targets.


```{r , fig.height=4,fig.width=6}
# Most frequent weapon types (at most 30 shown), worldwide.
# sort = TRUE is spelled out because `T` is an ordinary, reassignable variable.
p1 <- df %>%
  count(weaptype1_txt, sort = TRUE) %>%
  head(30) %>%
  ggplot(aes(reorder(weaptype1_txt, n), n)) +
  geom_col() +
  coord_flip() +
  labs(title = "Trend across weaptype", subtitle = "Globally", x = "weaptype", y = "Counts")

# Same ranking restricted to incidents in India.
p2 <- df %>%
  filter(country_txt == "India") %>%
  count(weaptype1_txt, sort = TRUE) %>%
  head(30) %>%
  ggplot(aes(reorder(weaptype1_txt, n), n)) +
  geom_col() +
  coord_flip() +
  labs(title = "Trend across weaptype", subtitle = "India", x = "weaptype", y = "Counts")

# Stack the panels vertically, stated explicitly like the other paired charts.
grid.arrange(p1, p2, ncol = 1)
rm(p1, p2)
```

```{r}
# Label missing weapon sub-types. Depending on how the csv was read, blank
# fields can arrive as NA or as empty strings, so both are mapped to
# 'Not Known' (replace_na alone leaves "" untouched).
df$weapsubtype1_txt <- replace_na(na_if(df$weapsubtype1_txt, ""), "Not Known")

# 30 most frequent weapon sub-types, bars ordered by frequency.
df %>%
  count(weapsubtype1_txt, sort = TRUE) %>%
  head(30) %>%
  ggplot(aes(reorder(weapsubtype1_txt, n), n)) +
  geom_col() +
  coord_flip() +
  labs(title = "Trend across weapsubtype", x = "weapsubtype", y = "Counts")




```



```{r}
# Label missing weapon details. Depending on how the csv was read, blank
# fields can arrive as NA or as empty strings, so both are mapped to
# "Not Known" (replace_na alone leaves "" untouched).
df$weapdetail <- replace_na(na_if(df$weapdetail, ""), "Not Known")

# 30 most frequent weapon-detail descriptions, bars ordered by frequency.
df %>%
  count(weapdetail, sort = TRUE) %>%
  head(30) %>%
  ggplot(aes(reorder(weapdetail, n), n)) +
  geom_col() +
  coord_flip() +
  labs(title = "Trend across weapdetail", x = "weapdetail", y = "Counts")


```


Now let's see whether there is any trend in the usage of "weaptype1_txt" over the years.

```{r,fig.width=6.2,fig.height=3}
# Fatalities per year, one facet per weapon type. Each facet gets its own
# y scale (scales = "free_y") so rarely used weapon types stay readable.
# Axis labels now describe what is plotted: x is the year, y the number killed.
df %>%
  group_by(weaptype1_txt, iyear) %>%
  summarise(nkill = sum(nkill)) %>%
  ungroup() %>%
  ggplot(aes(x = iyear, y = nkill)) +
  geom_col() +
  labs(title = "Trend across weaptype1_txt-Global", x = "Year", y = "Killed") +
  facet_wrap(~weaptype1_txt, scales = "free_y")

# Same view restricted to incidents in India.
df %>%
  filter(country_txt == "India") %>%
  group_by(weaptype1_txt, iyear) %>%
  summarise(nkill = sum(nkill)) %>%
  ungroup() %>%
  ggplot(aes(x = iyear, y = nkill)) +
  geom_col() +
  labs(title = "Trend across weaptype1_txt-India", x = "Year", y = "Killed") +
  facet_wrap(~weaptype1_txt, scales = "free_y")

```





